/**
 * Traditional Chinese UI messages for the data-pipelines feature area
 * (data collection, data sources, processing tasks, algorithm templates,
 * operators and the tool pool).
 *
 * Conventions visible in this table:
 * - Tokens in curly braces (`{field}`, `{nodeName}`, `{id}`, `{configName}`)
 *   are placeholders; presumably the i18n runtime interpolates them, so they
 *   must be kept verbatim when a string is edited.
 * - Keys ending in `_internal` hold tool display names; the matching
 *   `_internal_dec` key holds that tool's description.
 * - Some keys are misspelled (`peratorTip`, `executionStatus.wainting`).
 *   They are kept as-is because callers outside this file may look them up.
 */
export const dataPipelines = {
  // Generic prompts and top-level navigation
  "toSel": "請選擇",
  "toInput": "請輸入",
  "noData": "暫無數據",
  "saveConfiguration": "保存配置",
  "dataAcquisition": "數據採集",
  "dataCollectionTask": "數據採集任務",
  "dataSourceManagement": "數據源管理",
  "formatConversion": "格式轉換",
  "dataFormatConversion": "資料格式轉換",
  "taskDescription": "任務描述",
  "sourceFormat": "來源格式",
  "targetFormat": "目標格式",
  "dataFlowBranch": "資料流向分支",
  "startExecution": "開始執行",
  "searchTaskName": "搜尋任務名稱",
  "confirmTermination": "確認終止",
  "terminate": "終止",
  "waiting": "等待中",
  "error": "錯誤",
  "taskStatus": "任務狀態",
  "labelStudio": "資料標註",
  // Title/description pairs keyed by data source kind
  "dataSourceInfo": {
    "Mysql": {
      "title": "關係型數據庫(MySQL)",
      "desc": "批量導入數據庫表，支援自定義表、欄位"
    },
    "Mongodb": {
      "title": "非關係型數據庫(MongoDB)",
      "desc": "導入非關係型數據，支援集合、欄位選擇和結構轉換"
    },
    "File": {
      "title": "文件數據導入",
      "desc": "支援CSV、Excel、JSON等多種格式文件導入"
    },
    "Hive": {
      "title": "Hive系統導入",
      "desc": "高效讀取hive系統中存儲的數據"
    }
  },
  "testingConnection": "正在測試連接",
  "pleaseSelectAnExecutionTime": "請選擇執行時間",
  "deletingTask": "正在刪除任務",
  "terminatingTask": "正在終止任務",
  "createTask": "創建任務",
  "addDataSource": "添加數據源",
  "fileFormat": "文件格式",
  "connectionStatus": "連接狀態",
  "dataSourceType": "數據源類型",
  "searchDataSources": "搜索數據源",
  "searchNameOrDescription": "搜索名稱",
  "dataProcessing": "數據處理",
  "dataProcessingConfiguration": "數據處理配置",
  "taskFlowConfiguration": "任務流配置",
  "dataExportConfiguration": "數據導出配置",
  "taskExecuted": "任務已執行",
  "taskExecutionFailed": "任務執行失敗",
  "cannotCancel": "任務處理中，無法取消",
  "taskSuccessStop": "任務已成功停止",
  "taskStopFailed": "任務停止失敗",
  "processingResult": "處理結果",
  "algorithmTemplate": "算法模板",
  "builtInTemplate": "內置模板",
  "customTemplate": "自定義模板",
  "operatorManagement": "算子管理",
  "systemDashboard": "系統儀表盤",
  "concurrentTaskMonitoring": "併發任務監控",
  "myAlgorithmTemplate": "我的算法模板",
  "createAlgorithmTemplate": "創建算法模板",
  "dataProcessingDescription": "數據處理可支持用戶使用不同的模型算子，針對大模型所用的數據進行處理，包括數據清洗、自動數據增強及分析等處理方式，用戶可通過數據處理來獲取更高質量的數據",
  // Workflow editor: nodes, validation messages and canvas controls
  "nodeName": "節點名稱",
  "nodeConfig": "節點配置",
  "nodeType": "節點類型",
  "nodeNotSelected": "未選擇節點",
  "fieldRequired": "{field}為必填項",
  "noNodesError": "工作流中未存在任何節點",
  "unnamedNode": "未命名節點({id})",
  "unconnectedNodeError": "{nodeName}節點：尚未連接任何其他節點",
  "invalidConfigError": "{nodeName}節點：配置無效，請檢查必填項",
  "configRequiredError": "{nodeName}節點的【{configName}】是必填項，請填寫完整",
  "saveError": "保存工作流時出錯",
  "noMatchingNodeFound": "未找到匹配的節點",
  "searchProcessing": "搜索處理任務",
  "zoomIn": "放大",
  "zoomOut": "縮小",
  "resetView": "重置視圖",
  "clearCanvas": "清除畫布",
  "operationGuide": "操作指南",
  "operationGuide1": "從左側拖拽節點到右側畫布區域",
  "operationGuide2": "點擊節點上的連接點並拖動到另一個節點來創建連接",
  "operationGuide3": "拖拽節點可以調整位置",
  "operationGuide4": "鼠標懸停節點顯示刪除按鈕",
  "operationGuide5": "點擊刪除按鈕或按Delete鍵刪除選中節點",
  "configInfo": "配置信息",
  "search": "搜索",
  "loading": "加載中",
  "taskCategories": "任務分類",
  "allCategories": "全部分類",
  "taskList": "任務列表",
  "taskName": "任務名稱",
  "DatabaseName": "數據庫名稱",
  "ServerAddress": "服務器地址",
  "port": "端口號",
  "username": "用戶名",
  "password": "密碼",
  "authType": "鑒權類型",
  "collectionSourceName": "採集源名稱",
  "server": "服務器",
  "database": "數據庫",
  "task": "任務",
  "dataSourceDetails": "數據源詳情",
  "close": "關閉",
  "operationSuccessful": "操作成功",
  "operationFailed": "操作失敗",
  "basicInformation": "基本信息",
  "dataSourceName": "數據源名稱",
  "lastUpdate": "最後更新",
  "normal": "正常",
  "toBeTested": "待測試",
  "anomaly": "異常",
  "useRecord": "使用記錄",
  "dataImportTask": "數據導入任務",
  "persons": "個",
  "recentlyUsed": "最近使用",
  "dataVolume": "數據量",
  "total": "總",
  "startAt": "開始於",
  "done": "完成",
  "taskRunningHost": "任務運行主機",
  "recordsHaveBeenImported": "已導入記錄",
  "totalNumberOfRecords": "總記錄數",
  "cancelTask": "取消任務",
  "refreshStatus": "刷新狀態",
  "viewLog": "查看日誌",
  "resourceOccupation": "資源佔用",
  "RunItAgain": "重新運行",
  "dataConnectionConfiguration": "數據連接配置",
  "authType_option_NONE": "不做身份校驗",
  "authType_option_LDAP": "使用基於 LDAP/AD 的用戶身份校驗",
  "authType_option_KERBEROS": "使用 Kerberos/GSSAPI 做身份校驗",
  "authType_placeholder": "目前只支持 LDAP 模式",
  "collectionSourceDesc": "採集源描述",
  "testLink": "測試連接",
  "dataFilteringConfiguration": "數據篩選配置",
  "selectionSet": "選擇集合",
  "searchForTheTableName": "搜索表名稱",
  "allFields": "全部字段",
  "selectAll": "全選",
  "saveTheConfiguration": "保存配置",
  "saveAndExecute": "保存並執行",
  "executeImmediately": "立即執行",
  "selectTheExecutionTime": "選擇執行時間",
  "sure": "確定",
  "PleaseSelectTime": "請選擇時間",
  "fileUpload": "文件上傳",
  "jumpLink": "跳轉鏈接",
  "linkSuccess": "連接成功",
  "linkError": "連接失敗",
  "connectionInformation": "連結資訊",
  "TaskFailed": "任務失敗",
  "manualStop": "手動停止",
  "public": "公開",
  "private": "私有",

  // Task detail, session results and logs
  "createTime": "創建時間",
  "dataAmount": "數據量",
  "finishTime": "完成時間",
  "processedDataAmount": "已處理數據量",
  "processInfo": "處理詳情",
  "processStatus": "運行狀態",
  "processedData": "已處理數據",
  "graphicDemonstration": "圖形化演示",
  "sessionProcessedResult": "Session處理結果",
  "index": "序號",
  "preSession": "處理前Session",
  "processType": "處理方式",
  "afterSession": "處理後Session",
  "taskLog": "任務日誌",
  "logName": "日誌名稱",
  "downloadLog": "下載日誌",
  "others": "其他",
  "replace": "替換",
  "deduplicate": "去重",
  "remove": "刪除",
  "data_refine": "數據處理",
  "Internal": "內部",
  "data_generation": "數據生成",
  "data_enhancement": "數據增強",

  // Execution results and Celery node list
  "data_source": "數據源",
  "execution_completed_normally": "執行結束（正常）",
  "execution_end_error": "執行結束（錯誤）",
  "stopped": "已停止",
  "celery_node_service_list": "Celery 節點服務列表",
  "ip_address": "IP 地址",
  "current_number_tasks": "當前任務數",
  "node_status": "節點狀態",
  "heartbeat_time": "心跳時間",

  // Task list columns, statuses and row actions
  "taskType": "任務類型",
  "dataCleaning": "數據清洗",
  "processingStatus": "處理狀態",
  "processingText": "處理字段",
  "inProgress": "處理中",
  "completed": "已完成",
  "dataSource": "數據來源",
  "dataSourceBranch": "數據來源分支",
  "dataFlow": "數據流向",
  "startTime": "開始時間",
  "endTime": "結束時間",
  "executionStatus": {
    "success": "執行完成",
    "error": "執行失敗",
    "processing": "正在執行",
    // Correctly spelled key; lookups of `executionStatus.waiting` used to
    // resolve to undefined because only the misspelled key existed.
    "waiting": "等待執行",
    // Misspelled legacy key, kept so existing lookups keep working.
    "wainting": "等待執行",
  },
  "unknown": "未知",
  "online": "在線",
  "offline": "離線",
  "operations": "操作",
  "delete": "刪除",
  "deleteConfirm": "確認刪除",
  "cancelConfirm": "確認取消",
  "rerunItConfirm": "確認重新運行",
  "execute": "執行",
  "cancelExecute": "取消執行",
  "executeConfirm": "確認執行",
  "confirm": "確認",
  // Was "替換" (the value of `replace`); "重置" matches `resetView`.
  "reset": "重置",
  "details": "詳情",
  "authorize": "授權",
  "settings": "設置",
  "operatorAuthorization": "算子授權",
  "SearchUserName": "搜索用戶名稱",
  "SearchOrganizationName": "搜索組織名稱",
  "person": "個人",
  "organization": "組織",
  "selected": "已選",
  // Icon upload dialog
  "editIcon": "編輯圖標",
  "iconPreview": "圖標預覽",
  "please": "請",
  "uploadTips1": "支持JPG、PNG格式圖標，最大不超過10MB",
  "uploadTips2": "已上傳新圖標，可繼續上傳替換或點擊確定保存",
  "uploadIcon": "上傳圖標",
  "uploadStatusTips1": "點擊或拖拽圖標到此處",
  "uploadStatusTips2": "上傳後將替換當前圖標",
  "uploading": "正在上傳",
  "uploadSuccess": "上傳成功",
  "uploadSuccessTips1": "可繼續上傳替換或點擊確定保存",
  "reUpload": "重新上傳",
  "uploadFailed": "上傳失敗",
  "retry": "重試",
  "uploadSuccessTips2": "圖標上傳成功",
  "uploadFailedTips1": "請上傳JPG或PNG格式的圖標",
  "uploadFailedTips2": "圖標大小不能超過10MB",
  "uploadFailedTips3": "上傳失敗，請重試",
  "networkError": "網絡錯誤，請檢查連接後重試",
  "submitting": "保存中",
  // Algorithm / task templates
  "algorithmTemplateDescription": "算法模版可支持用戶使用多種不同的模型算子組成工作流，完成數據清洗、自動數據增強及分析等工作。",
  "taskTemplate": "任務模板",
  "templateName": "模板名稱",
  "templateDescription": "模板描述",
  "searchTaskTemplate": "搜索任務模板",
  "searchTemplate": "搜索模板",
  "searchOperator": "搜索算子",
  "nextStep": "下一步",
  "previousStep": "上一步",
  "create": "創建",
  "edit": "修改",
  "type": "類型",
  "copy": "複製",
  "use": "使用",
  "templateList": "模板列表",
  "createTemplate": "創建模板",
  "editTemplate": "修改模板",
  "general": "通用",
  "dataCleaningDescription": "通過去重、去敏等多種算子，清洗數據，使數據滿足使用需求",
  "dataAugmentation": "數據增強",
  "dataAugmentationDescription": "基於種子數據自動化生成更多數據，可用於訓練數據生成，支持自定義參數及Prompt",
  "textClassification": "文本分類",
  "textClassificationDescription": "增強文本分類任務的訓練數據，適用於情感分類、標籤分類、商品分類等場景",
  "textExtraction": "文本抽取",
  "textExtractionDescription": "增強文本抽取類任務的訓練數據，適用於特定格式抽取、實體抽取、要素提取等場景",
  "textGeneration": "文本創作",
  "textGenerationDescription": "增強文本創作類任務的訓練數據，適用於新聞寫作、廣告稿生成、寫作內容風格化等場景",
  "apply": "使用",
  "newTask": "新建任務",
  "pushToOriginalDataset": "推送到原數據集",
  "pushToOriginalDatasetDescription": "推送到原數據集後，將以新提交的方式推送到原始數據集repo中",
  "pushToNewDataset": "推送到新數據集",
  "pushToSelectedDatasetDescription": "數據清洗完成後，將推送到所選數據集",
  "targetDataset": "目標數據集名稱",
  // Operators: names, parameters and descriptions
  "predefinedOperatorSelection": "預置算子選擇",
  "predefinedOperator": "預置算子",
  "peratorTip": "目前支持多種 Mapper、Filter、Deduplicator 類型的預置算子",
  "publishAsNewTemplate": "發佈為新模版",
  "executionOrder": "執行順序",
  "enableOrNot": "是否開啟",
  "addOperator": "添加算子",
  "operatorType": "算子類型",
  "operatorName": "算子名稱",
  "textNormalization": "文本標準化",
  "removeSpecialContent": "特殊內容移除",
  "maskSensitiveInformation": "敏感信息打碼",
  "specialCharacterRatioFiltering": "特殊字符佔比過濾",
  "sensitiveWordFiltering": "敏感詞過濾",
  "nGramRepetitionRatioFiltering": "N-Gram重複比率過濾",
  "lengthFiltering": "長度過濾",
  "md5Deduplication": "MD5去重",
  "articleSimilarityDeduplication": "文章相似度去重",
  "toxicityRemoval": "毒性去除",
  "operatorConfiguration": "算子配置",
  "unicodeTextNormalization": "Unicode文本標準化",
  "convertTraditionalChineseToSimplifiedChinese": "繁體轉簡體",
  "removeURLLinks": "去除URL鏈接",
  "removeInvisibleCharacters": "去除不可見字符",
  "removeHtmlTagsAndParseHtmlContent": "去除html格式字符並解析出html文本",
  "maximumRatio": "比例最大值",
  "lengthN": "長度N",
  "minimumLength": "長度最小值",
  "characters": "字符",
  "windowLength": "窗口長度",
  "description": "描述",
  // Was "繁體轉中文"; aligned with convertTraditionalChineseToSimplifiedChinese.
  "textNormalizationDesc": "文本Unicode標準化和繁體轉簡體",
  "removeSpecialContentDesc": "移除文本中的特殊內容，例如文章中的url、不可見字符、html格式字符等",
  "maskSensitiveInformationDesc": "將敏感信息打碼，例如將郵箱地址字符替換成[EMAIL]，手機電話號碼替換成[TELEPHONE]或[MOBILEPHONE]，身份證號碼替換成[IDNUM]",
  "specialCharacterRatioFilteringDesc": "根據特殊字符佔比過濾文本，保留特殊字符個數佔文本總長度比例不超過設定閾值的樣本，特殊字符包括標點符號，數字，空格符號，emoji表情包等，超過設定比例的數據樣本將被過濾",
  "sensitiveWordFilteringDesc": "過濾掉帶有敏感詞的樣本",
  "nGramRepetitionRatioFilteringDesc": "保留字符級N-Gram重複比率不超過設定閾值的樣本，超過閾值的樣本將被過濾",
  "lengthFilteringDesc": "根據文本長度過濾數據，長度範圍之外的數據將被過濾",
  "md5DeduplicationDesc": "根據文本生成的MD5值對比去重，MD5校驗一致的樣本將被過濾",
  "articleSimilarityDeduplicationDesc": "使用SimHash算法計算文本間的相似度，相似度超過閾值樣本將被過濾",
  "toxicityRemovalDesc": "自動檢測分析並去除數據中敏感、不合規的內容，本算子僅對數據內容進行分析、處理，不保存、保留任何處理前、處理後的數據內容",
  "previewBefore": "效果預覽（清洗前）",
  "previewAfter": "效果預覽（清洗後）",
  "creationCompleted": "創建完成",
  "updateTemplate": "更新模板",
  "cancel": "取消",
  "templateNameExists": "模板名稱已存在，請使用其他名稱",
  "Queued": "待處理",
  "Processing": "處理中",
  "Finished": "已完成",
  "Failed": "失敗",
  "Timeout": "超時",
  "Canceled": "已取消",
  "sessionDel": "Session已刪除",

  // Tool pool page
  "toolsTit": "工具池",
  "toolsDec": "Dataflow 工具池是一個一站式多模態數據處理系統，可使數據質量更高、更有價值、更適合大模型處理。",
  "toolsSearch": "搜索工具",
  "toolsType": "工具分類",
  "toolsName": "工具名稱",
  "toolsUse": "使用工具",
  "taskType1": "算子",
  "taskType2": "工具",
  "log": "日誌",
  "toolsTab1": "內部工具",
  "toolsTab2": "外部工具",

  // Display names of internal tools (keys end in `_internal`)
  "analysis_common_internal": "通用分析工具",
  "dataset_spliter_by_language_preprocess_internal": "數據集按語言分割預處理工具",
  "prepare_dataset_from_repo_preprocess_internal": "從代碼倉庫準備數據集預處理工具",
  "raw_alpaca_cot_merge_add_meta_preprocess_internal": "原始Alpaca-Cot數據合併與元數據添加預處理工具",
  "raw_arxiv_to_jsonl_preprocess_internal": "原始arXiv數據轉換為JSONL預處理工具",
  "raw_stackexchange_to_jsonl_preprocess_internal": "原始Stack Exchange數據轉換為JSONL預處理工具",
  "reformat_csv_nan_value_preprocess_internal": "CSV文件NaN值重格式化預處理工具",
  "reformat_jsonl_nan_value_preprocess_internal": "JSONL文件NaN值重格式化預處理工具",
  "serialize_meta_preprocess_internal": "元數據序列化預處理工具",
  "count_token_postprocess_internal": "令牌計數後處理工具",
  "data_mixture_postprocess_internal": "數據混合後處理工具",
  "deserialize_meta_postprocess_internal": "元數據反序列化後處理工具",
  "quality_classifier_common_internal": "質量分類器通用",
  "opencsg_data_extraction_preprocess_internal": "開放計算系統數據提取預處理",
  "opencsg_scrape_url_data_preprocess_internal": "開放計算系統抓取 URL 數據預處理",
  "fineweb_edu_chinese_common_internal": "文本價值評估",
  "smoltalk_chinese_common_internal": "高質量對話生成",
  "cosmopedia_chinese_preprocess_internal": "增強文本描述工具",

  // Descriptions of the internal tools (keys end in `_internal_dec`)
  "analysis_common_internal_dec": "此分析器類用於分析特定數據集。它會為配置文件中的所有過濾操作計算統計數據，對這些統計數據應用多種分析（如整體分析、逐列分析等），並生成分析結果（統計表、分佈圖等），幫助用戶更好地理解輸入數據集。",
  "dataset_spliter_by_language_preprocess_internal_dec": "從源目錄加載數據集，然後使用名為 LanguageIDScoreFilter 的操作過濾器進行語言識別，最後按語言分割數據集並保存。",
  "prepare_dataset_from_repo_preprocess_internal_dec": "從代碼倉庫中準備數據集，格式包括：倉庫名稱、倉庫中的文件路徑、文件內容。",
  "raw_alpaca_cot_merge_add_meta_preprocess_internal_dec": "將從Hugging Face下載的原始Alpaca-Cot數據轉換為JSONL文件，合併指令/輸入/輸出文本，並添加元數據信息。",
  "raw_arxiv_to_jsonl_preprocess_internal_dec": "將原始arXiv數據（gzipped tar文件）轉換為JSONL格式。",
  "raw_stackexchange_to_jsonl_preprocess_internal_dec": "將從Archive（參考：https://archive.org/download/stackexchange）下載的原始Stack Exchange數據轉換為多個JSONL文件。",
  "reformat_csv_nan_value_preprocess_internal_dec": "使用Hugging Face加載可能包含NaN值的CSV或TSV文件，並可通過設置額外參數（如設置 keep_default_na 為False）進行處理。",
  "reformat_jsonl_nan_value_preprocess_internal_dec": "重格式化可能包含NaN值的JSONL文件。遍歷JSONL文件，找到第一個不包含NaN的對象作為參考特徵類型，並將其設置為加載所有JSONL文件時的基準。",
  "serialize_meta_preprocess_internal_dec": "序列化JSONL文件中除用戶指定字段以外的所有字段，確保即使JSONL文件中每行文本格式不一致，數據集仍可正常加載。",
  "count_token_postprocess_internal_dec": "統計給定數據集和分詞器的令牌數量。目前僅支持JSONL格式。",
  "data_mixture_postprocess_internal_dec": "將多個數據集混合成一個數據集。隨機選擇每個數據集的樣本並混合這些樣本，然後導出為新的混合數據集。支持的格式包括：[“jsonl”, “json”, “parquet”]。",
  "deserialize_meta_postprocess_internal_dec": "對JSONL文件中的指定字段進行反序列化處理。",
  "quality_classifier_common_internal_dec": "本質量分類器類用於預測數據集中文檔的評分。它將計算所有行的分數，並為每一行提供兩列：分數（score）和是否保留（should_keep），以幫助用戶決定應該刪除哪一行。默認情況下，如果分數高於 0.9，則將該行標記為 should_keep=1。",
  "opencsg_data_extraction_preprocess_internal_dec": "一個高質量的工具，用於將 PDF 轉換為 Markdown 和 JSON",
  "opencsg_scrape_url_data_preprocess_internal_dec": "基於大型語言模型的網站和本地文檔（XML、HTML、JSON 等）的數據抓取工具",
  "fineweb_edu_chinese_common_internal_dec": "用戶可以定義自己的評分標準，根據這些標準對數據源中的數據進行評分，並過濾數據。最高分是5分。",
  "smoltalk_chinese_common_internal_dec": "使用固定的system_prompt生成具有大型模型的相關多輪對話並對其進行評分。根據用戶指定的分數過濾數據，只保留分數最高的數據。",
  "cosmopedia_chinese_preprocess_internal_dec": "使用MakeCosmopediaMapper操作符將原始文本轉換為WikiHow樣式的詳細教程。此工具調用大型語言模型，根據輸入的種子文本生成結構化教程內容。",
}